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ocketO -> sf_socket (domain , service, protocol) 

if (this is a TCP socket) { 

if (called for the first time) { 

perform SAN transport initialization; 
Start up SAN Transport; 

fd = socket (domain, service, protocol) 
Note fd of first socket call; 
return (fd) ; 



else { 

fd = socket (doitiain ; service, protocol) 
return (f d) ; 



return (socket (domain, service, protocol) 



else 




bind() -> sfjbind (fd, sockaddr, addrlen) { 

Note IP address & port #; 

if (this is a TCP socket) { 

if (port is specified) 

note fd as service fd for this port; 

return (bind (fd, sockaddr, addrlen)); 



else 

return (bind (fd r sockaddr, addrlen) ) ; 





connect () sf_connect (fd, sockaddr , addrlen) { 

Note IP address & port #; 

if (this is a TCP socket) { 

if (this is a non-blocking socket) { 

if ( CONNECT I ON_RE QUE ST msg not previously sent for this fd) 
send CONNECTIONLESS QUE ST msg with fd to proxy node; 

if (ACCEPT_CONNECTION or RE JECT_CONNECTION msg is pending) { 

if (receive ACCEPT_CONNECTION msg) { 

assign mapped fd by mapping OS-assigned fd to a transport fd; 

return (success) ; 

} 

else 

return (connection refused error) ; 

} 

else 

return (connection in progress) ; 

} 

else { 

send CONNE CTION__RE QUE ST msg with fd to proxy node; 

wait to receive (ACCEPT_CONNECTION or RE JECT_CONNECTION msg) ; 

if (receive ACCEPT CONNECTION msg) { 

assign mapped fd by mapping OS-assigned fd to a transport fd; 

return (success) ; 
} 

else 

return (connection refused error) ; 

} 



else 

return (connect {fd, sockaddr,, addrlen)) 



listen () — > sf_listen(fd, backlog) { 



switch (type of fd) { 

case service fd: 

send J0INJ3ERVXCE msg; 
return (success) ; 

case mapped fd: 

case transport fd: 

return (exception error) ; 

default: 

return ( listen (fd, backlog)) 




accept () --> sf_accept (fd, clientaddr, len) { 

switch (type of fd) { 

case service fd: 

if (this is a non-biocking socket) { 

if CONNECTION_REQUEST msg is pending for this service fd { 

read CONNECTION_REQUEST msg with proxy-assigned flow xd; 

if (connection can be accepted) { 
send ACCEPT_CONNECTION msg; 
return (flow id) ; 

} 

else { 

send REJECT_CONNECTION msg; 
return {try again) ; 

} 

} 

else 

return (try again) ; 

} 

else { 

while (1) { 

if CONNECTION_REQUEST msg is pending for this service fd { 

read CONNECTION_REQUEST msg with proxy-assigned flow id; 

if (connection can be accepted) { 
send ACCEPT_CONNECTION msg; 
return (flow id) ; 

} 

else { 

send RE JECT_CONNECTION msg; 

} 

} 

else 

wait to receive CONNECTION_REQUEST msg; 
} / / while loop 



case transport fd: 

return (exception error) ; 

default: 

return ( accept (fd, clientaddr, len) ) ; 

} 



} 
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select {) -> sf_select (nfds, readfds, writefds, exceptfds, timeout) { 
note the number of fds to select on; 

set timeslice as a function of timeout and number of fds; 

do forever { 

// PHASE 1: POLL ALL FDs 

for each service fd m readfds { 

if CONNECT ION_REQUE ST msg is pending for this service fd 

set corresponding service fd as available; 

} 

for each transport fd in readfds { 

if DATA msg is pending for this transport fd 
set corresponding transport fd as available ; 

} 

for each mapped fd m readfds { 

perform mapping to transport fd; 
if DATA msg is pending for this transport fd 
set corresponding mapped fd as available; 

} 



for each transport fd in writefds { 

if DATA msg can be sent on this transport fd 
set corresponding transport fd as available; 

} 

for each mapped fd in writefds { 
perform mapping to transport fd; 
if DATA msg can be sent for this transport fd 
set corresponding mapped fd as available ; 

} 

for each service fd in exceptfds { 

if exception occurs for this service fd 
set corresponding service fd; 

} 

for each transport fd in exceptfds { 

if exception occurs for this transport fd 
set corresponding transport fd; 

} 

for each mapped fd in exceptfds { 
perform mapping to transport fd; 
if exception occurs for this transport fd 
set corresponding mapped fd; 

} 

for al other fds 

call original system select () ; 

combine all available descriptors; 

if (one or more descriptors are ready) 

return (number of descriptors available); 
else 

choose one descriptor m readfds to wait on; // heuristic-based choice 

restore original descriptor sets; 

if (time is up AND no fd is available) 
return (timed out) ; 

// PHASE 2: WAIT if necessary 

wait for arrival of CONNECTION_REQUEST , ACCEPT_CONNECTION, 

RE JE CT_CONNE C T I ON or DATA msg for the chosen descriptor, up to timeslice 

} 

} 
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recvO -> sf_recv (fd, buf, len, flags) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if ( M S G_W A I T AL L flag is not set) { 

if at least one DATA msg is pending for this transport fd { 
receive data into buf; 
return (number of bytes read) ; 

} 

else { 

if (this is a non-blocking socket) 

return (resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 

receive data into buf; 

return (number of bytes read) ; 

} 

} 

else { 

wait until all len bytes of DATA msgs for this transport fd arri 

receive data into buf; 

return (number of bytes read) ; 

} 

default: 

return ( recv (fd, buf, len)); 

} 

} 



send() sf_send (fd, buf, len, flags) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (this is a non-blocking socket) { 

if (no DATA msg can be sent at this time) 

return (try again) ; 
else 

send DATA msg(s) with data from buf in non-blocking fashion 
else { 

if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA msg(s) with data from buf; 

} 

return (number of bytes sent) ; 

default : 

return (send (fd, buf, len)); 





read() -> sf_read (fd, buf, len) { 

switch {type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if at least one DATA msg is pending for this transport fd { 

receive dara into buf; 

return (number of bytes read) ; 

} 

else { 

if (this is a non-blocking socket) 
return {resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 

receive data into buf; 

return (number of bytes read) ; 



default : 

return ( read (fd, buf, len)); 
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write () -> sf_write (fd, buf, len) { 



switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (this is a non-blocking socket) { 

if (no DATA msg can be sent at this time) 

return (try again) ; 
else 

send DATA msg(s) with data from buf m non-blocking fashion; 



if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA msg(s) with data from buf; 

} 

return (number of bytes written) ; 



else { 



default: 



return (write (fd, buf, len)); 





readv() -> sf_readv <fd, vector__buf, vector_count) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if at least one DATA msg is pending for this transport fd { 
scatter data received into vector buf; 
return (number of bytes read) ; " 

} 

else { 

if (this is a non-blocking socket) 
return {resource not available) ; 
else { 

wait to receive a DATA msg for this transport fd; 

scatter data received into vector buf; 
return (number of bytes read) ; 



default: 



return ( readv (fd, buf, len) ) ; 




writev() -> sf_writev (fd, vectorjbuf, vector_count) { 

switch (type of fd) { 

case service fd: 

return (exception error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 



if (this is a non-blocking socket) { 

if (no DATA msg can be sent at zhis time) 

return (try again) ; 
else 

send DATA msg(s) with gathered data from vectorjbuf; 



else { 

if ( no DATA msg can be sent at this time) 

Wait until atleast one DATA msg can be sent; 
send DATA rnsg(s) with gathered data from vector ouf; 



return (number of bytes written) ; 



default: 



return (writev (fd, buf, len) ) ; 




ioctl() -> sf_ioctl (fd, request, arg) { 

switch (type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

switch (request) { 



case FIONBIO: 

set non-blocking I/O variable to value m arg; 

return (success); 
case FIOASYNC: 

set async I/O variable to value in arg; 

return (success) ; 
case FIONREAD: 

peek at DATA msg for this transport fd; 

set number of bytes in arg; 

return (success) ; 
default: 

return (warning: option not meaningful in SAN Transport) 



default : 



return (ioctl (fd, request, arg)); 





getsocknameO -> sf_getsockname (fd, localaddr, addrlen) { 

switch (type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

return (local protocol address associated with this transport fd) ; 



default: 



return (getsockname (fd, localaddr, addrlen)); 




getpeername ( ) -> sf_getpeername (fd, localaddr, addrlen) { 

switch (type of fd) { 

case service fd: 

return (socket not connected error) ; 

case mapped fd: 

perform mapping to transport fd; 

case transport fd: 

if (information is available from the proxy node) 



return (foreign protocol address associated with this transport fd) 



else 



return (address not available) ; 



default: 



return (getpeername (fd, localaddr, addrlen}); 
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getsockopt() ~> sf_getsockopt (fd, level, optname, optval, optlen) { 

if (level == SOL_SOCKET) { 
switch (type of fd) { 

case service fd: 

return (warning: setsockopt() not meaningful for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 



case transport fd: 

switch (optname) { 
case SO_RCVBUF : 
case SO_SNDBUF: 

if (buffering supported by proxy node) { 

get corresponding state variable and place value m optval; 
return (success); 

} 

else 

return (unable to get buffer sizes); 

case SO_LINGER: 
case SOJRCVLOWAT: 
case SO_SNDLOWAT: 

get corresponding state variable and place value m optval; 
return (success); 
i*^ case SO_TYPE: 

return (SOCK_STREAM) ; 
default: 

'%! return (warning: option not meaningful m SAN Transport) ; 

IS default: 

hi return ( getsockopt ( f d, level, optname, optval, optlen} ); 

: s "; } 

""4. 

m > 

if (level == IPPROTO__TCP) { 
switch (type of fd) { 

II 5 

case service fd: 

fy return (warning: setsockopt() not meaningful for service fd) ; 

_;KSj case mapped fd: 

I"™ perform mapping to transport fd; 

case transport fd: 

switch (optname) { 
case TCP_MAXSEG: 

get segment size of SAN transport and place value m optval; 
return (success) ; 
case TCP_NODELAY: 

if (no-delay option is known) { 

get value and place in optval; 

return (success) ; 

} 

else 

return (error) ; 

default: 

return (warning: option not meaningful m SAN Transport) ; 



default: 

return ( getsockopt ( fd, level, optname, optval, optlen) ); 

} 

return {not implemented) ; 

} 



setsockopt() -> sf_setsockopt (fd, level, optname, optval, optlen) { 



} 



if (level -= SOL_SOCKET) { 
switch (type of fd) { 
case service fd: 

return (warning: setsockoptO not meamngfal for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 
case transport fd: 

switch (optname) { 
case SO_RCVBUF : 
case SO_SNDBUF: 

if (buffering supported by proxy node) { 

set corresponding state variable to value given by optval; 
communicate buffer size given by optval to proxy node; 
if (communication successful) 

return (success) ; 
else 

return (unable to set buffer size); 

} 

else 

return (unable to sec buffer sizes); 

case SO_LINGER: 
case SO_RCVLOWAT: 
case SO_SND LOWAT : 

set corresponding state variable to value given by optval; 
communicate optname ana optval to proxy node; 
if (communication successful) 

return (success) ; 
else 

return (unable to set option) ; 
default : 

return (warning: option not meaningful m SAN Transport) ; 

} 

default: 

return ( setsockopt ( f d, level, optname, optval, optlen) ); 

} 

if (level == IPPROTO_TCP) { 
switch (type of fd) { 
case service fd: 

return {warning: setsockoptO not meaningful for service fd) ; 
case mapped fd: 

perform mapping to transport fd; 
case transport fd: 
switch (optname) { 
case TCP_MAXSEG: 

set segment size of SAN transport to value given by optval; 
return (success ) ; 
case TCP_NODELAY: 

set no-delay variable to value given by optval; 
communicate optname and optval to the proxy node; 
if (communication successful) 

return (success) ; 
else 

return (unable to set no-delay option); 
default: 

return (warning: option not meaningful m SAN Transport) ; 

default: 

return ( setsockopt ( fd, level, optname, optval, optlen) ); 

} 

return (not implemented) ; 
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close () -> sf_close (fd) { 



switch (type of fd) { 

case service fd: 

send LEAVE_SERVICE msg on service fd; 

clean up transport resources associated with this service; 
return (close {fd}); 

case mapped fd: 

perform mapping to transport fd; 

send CLOSE_CONNECTION msg on transport fd; 

reset fd mapping; 
return (close (fd)); 

case transport fd: 

send CLOSE_CONNECTION msg on transport fd; 



default: 



return (close (fd) ) ; 




shutdown () -> sfjshutdown (fd, howto) { 

if (howto = SHUT_RD) { 

if {fd already closed for writes) 
set full_shutdown_f lag to TRUE; 
else 

note that fd is closed for further reads; 

} 

if (howto == SHUTJ/fR) { 

if (fd already closed for reads) 

set full_shutdown_f lag to TRUE; 
else 

note that fd is closed for further writes ; 

} 

if (howto == SHUT_RDWR) { 

set full_shutdown_f lag to TRUE ; 

} 

if (full_shutdown_flag == TRUE) { 

switch (type of fd) { 
case service fd: 
^ send LEAVE_SERVICE msg on service fd; 

^ clean up transport resources associated with this service; 

]1 break; 

7$ case mapped fd: 

^ perform mapping to transport fd; 

2 send CLOSE_CONNECTION msg on transport fd; 

II reset fd mapping; 

. break; 

™ case transport fd: 

^ send CLOSE_CONNECTION msg on transport fd; 

y break; 

™ default: 

^ return ( shutdown (fd, hotwo) ) ; 

} 

return ( shutdown (fd, howto)); 
} 



